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Trivial scheduler 


class TrivialSched: 


Thread myThread; 
Mutex myLock ; 
ConditionVariable myCond; 
List<Callback> myQueue; 


TrivialSched::Post(const Callback& aFunc) 
d 
myLock.Lock(); 
myQueue.Append(aFunc) ; 
myCond.Signal(); 
myLock.Unlock(); 
} 


TrivialSched::Run() 
d 
while(!IsStopped()) { 
myLock.Lock(); 
while (myQueue.IsEmpty()) 
myCond.Wait(); 
Callback cb = myQueue.Pop(); 
myLock.Unlock(); 


cb.Execute(); 


Trivial scheduler 


class TrivialSched: TrivialSched::Post (const Callback& aFunc) 
Thread myThread; { 
Mutex myLock; N myLock.Lock(); 
ConditionVariable myCond; myQueue .Append(aFunc) ; 
List<Callback> myQueue; myCond.Signal(); 


myLock.Unlock(); 


} 
Single thread 


TrivialSched::Run() 


d 
while(!IsStopped()) { 
myLock.Lock(); 
while (myQueue.IsEmpty()) 
NK. myCond.Wait(); 
Callback cb = myQueue.Pop(); 
myLock.Unlock(); 
cb.Execute(); 
i 
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Trivial scheduler 


class TrivialSched: TrivialSched::Post (const Callback& aFunc) 
Thread myThread; í 
Mutex myLock ; myLock.Lock(); Append 
ConditionVariable myCond; myQueue . Append (aFunc); under a lock 
List<Callback> myQueue; myCond.Signal(); 
myLock.Unlock(); 
} 
Single thread 
TrivialSched::Run() 
d 
while(!IsStopped()) { Pop under a 
myLock .Lock (); K lock 
Simple locked while (myQueue.IsEmpty()) 
myCond.Wait(); 
queue Callback cb = myQueue.Pop(); 
myLock.Unloc ; 
cb.Execute(); 
} 
} 


Trivial scheduler 


class TrivialSched: TrivialSched::Post (const Callback& aFunc) 
Thread myThread; í 
Mutex myLock ; myLock.Lock(); 
ConditionVariable myCond; myQueue .Append(aFunc) ; 
List<Callback> myQueue ; myCond.Signal(); 


myLock.Unlock(); 


} 
Single thread 


TrivialSched::Run() 


í 
while(!IsStopped()) { 
myLock .Lock (); 


Simple locked while (myQueue.IsEmpty()) 
myCond.Wait(); 
queue Callback cb = myQueue.Pop(); 


myLock.Unlock(); 


cb.Execute(); Execute one 
by one 
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Lock-free atomics 


Atomically get the old | AtomicLoad(var) 
í * Google "memory models" 


value return var; about why it has to be atomic 


AtomicCompareExchange (var, new value, check) 


Atomically set if the old 


value equals something if (var != check) 
return false; 
var = new value; 

return true; 


Atomically set a new AtomicExchange (var, new value) 


d 
value and get the old Sat = var 
value var = new value; 


return old value; 
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Front queue 


Multi-Producer-Single-Consumer* 


e] E-==——————— | 
All threads Sched-worker 


* Common notation for queues: 
MPSC, MPMC, SPSC, SPMC 
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> | |! 
= Multi-Producer-Single-Consumer 
ER E ee 
= ) All threads Sched-worker 


NormalQueue: :Push(T* aItem) 


{ 
if (myHead == nullptr) 
myHead = aItem; 
else 
myTail->myNext = altem; 
myTail = alten; 
} 
NormalQueue: :Pop() 
{ 
if (myHead == nullptr) 
return nullptr; 
T* res = myHead; 
myHead = res->myNext; 
return res; 
} 


High 
contention 


Normally a queue 
needs 2 members: 
head and tail 
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= ) All threads Sched-worker 


NormalQueue: :Push(T* aItem) 


{ 
if (myHead == nullptr) 
myHead = aItem; 
else 
myTail->myNext = altem; 
myTail = aItem; A 
} 
NormalQueue: :Pop() 
{ 
if (myHead == nullptr) 
rn nullptr; 
T* res = myHead; 
myHead = res->myNext; 
return fes; 
} 


High 
contention 


Doing it in a lock-free 
way is hardly possible 
- too many variables 
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MPSCQueue: :Push(T* altem) 


{ 


T* oldTop; 

do { 
oldTop = AtomicLoad(myTop) ; 
altem->myNext = oldTop; 

} while (not AtomicCompareExchange ( 
myTop, altem, oldTop)); 


MPSCQueue: :PopAll(T* altem) 


{ 


T* top = AtomicExchange(myTop, nullptr); 
return ReverseList(top); 


High 
contention 


Make ita stack to 
reduce the number of 
variables 
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class MPSCQueue: 


MPSCQueue: :Push(T* altem) 
T* myTop; 


d 
T* oldTop; 
do í 


oldTop = AtomicLoad (myTop) ; 
eege = oldTop; 

} while (not AtomicCompareExchange ( 
myTop, altem, oldTop)); 


MPSCQueue: :PopAll(T* altem) 

{ 
T* top = AtomicExchange (myTop, nullptr); 
return ReverseList(top); 


High 
contention 


Retry atomic push of 
anew top. Stack 
grows 


SPO JS) Front queue High 
FD 


Multi-Producer-Single-Consumer contention 
= $ — ee nr. | 
=) All threads Sched-worker 
class MPSCQueue: MPSCQueue: :Push(T* altem) 
T* myTop; { 

T* oldTop; 

do { 
oldTop = AtomicLoad(myTop) ; 
altem->myNext = oldTop; 

} while (not AtomicCompareExchange ( 
myTop, altem, oldTop) ); Pop takes all and 

} turns stack to queue 


MPSCQueue: :PopAll(T* altem) 
{ 


T* top = AtomicExchange(myTop, nullptr); 
return ReverseList(top); 


SPO ASS) Front queue 
=p 


Multi-Producer-Single-Consumer 


EN ee oe, .. a 
mm ) All threads Sched-worker 
class MPSCQueue: MPSCQueue: :Push(T* altem) 
T* myTop; { 
T* oldTop; 
do { 


oldTop = AtomicLoad(myTop); 
altem->myNext = oldTop; 

} while (not AtomicCompareExchange ( 
myTop, altem, oldTop)); 


MPSCQueue: :PopAll(T* altem) 

{ 
T* top = AtomicExchange (myTop, nullptr); 
return ReverseList(top); 


High 
contention 
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There is no simple unbounded lock-free MCSP queue 
* Google "ABA-problem" about why 


Ready queue High 
> Multi-Consumer Consumer-Single-Producer contention 
` Allthreads  Sched-worker 


There is no simple unbounded lock-free MCSP queue 
* Google "ABA-problem" about why 


But there are these: 
Unbounded lock-based Bounded lock-free MCSP 
MCSP queue queue 
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class LockFreeBounded: 
uint64 myIdxBegin; 
uint64 myIdxEnd; 
uint32 mySize; 

T* myBuffer; 


Cyclic array with 
atomic indexes 
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LockFreeBounded: :Push(T* altem) 


{ 


uint64 idxEnd = AtomicLoad(myIdxEnd) ; 

if (idxEnd - AtomicLoad(myIdxBegin) == mySize) 
return false; 

myBuffer[idxEnd % mySize] = altem; 

AtomicExchange (myIdxEnd, idxEnd + 1); 


LockFreeBounded: : Pop() 


d 


T* res; 

do { 
uint64 idxBegin = AtomicLoad(myIdxBegin); 
if (idxBegin == AtomicLoad(myIdxEnd) ) 


return nullptr; 
res = myBuffer[idxBegin % mySize]; 
} while (not AtomicCompareExchange ( 
myIdxBegin, idxBegin + 1, idxBegin)); 
return res; 


Ready queue - Bounded Lock-Free 


class LockFreeBounded: LockFreeBounded: : Push(T* altem) 
uint64 myIdxBegin; { 
uint64 myIdxEnd; uint64 idxEnd = AtomicLoad (myIdxEnd) ; 
uint32 mySize; if (idxEnd - AtomicLoad(myIdxBegin) == mySize) 


T* myBuffer; return false; 
myBuffer[idxEnd % mySize] = altem; 


AtomicExchange(myIdxEnd, idxEnd + 1); 


LockFreeBounded: : Pop( ) 


Single producer t 
: T* res; 
atomically bumps do { 
'end index: uint64 idxBegin = AtomicLoad(myIdxBegin); 


if (idxBegin == AtomicLoad(myIdxEnd) ) 
return nullptr; 
res = myBuffer[idxBegin % mySize]; 
} while (not AtomicCompareExchange ( 
myIdxBegin, idxBegin + 1, idxBegin)); 
return res; 
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class LockFreeBounded: 
uint64 myIdxBegin; 
uint64 myIdxEnd; 
uint32 mySize; 
T* myBuffer; 


Consumers read by 
atomically incremented 
'begin index' 
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LockFreeBounded: :Push(T* altem) 


{ 


uint64 idxEnd = AtomicLoad(myIdxEnd) ; 

if (idxEnd - AtomicLoad(myIdxBegin) == mySize) 
return false; 

myBuffer[idxEnd % mySize] = altem; 

AtomicExchange (myIdxEnd, idxEnd + 1); 


LockFreeBounded: : Pop() 


d 


T* res; 
do { 
uint64 idxBegin = AtomicLoad(myIdxBegin); 
if (idxBegin == AtomicLoad(myIdxEnd)) R, 


return nullptr; 
res = myBuffer[idxBegin % mySize]; 
yi while (not AtomicCompareExchange ( 
myIdxBegin, idxBegin + 1, idxBegin)); 
return res; 


Ready queue - Unbounded Locked 


class LockedUnbounded: 
Mutex myLock ; 
List<T> myQueue; 


/ 


Trivial mutex and list 


LockedUnbounded: :Push(T* altem) 


{ 


} 


myLock.Lock (); 
myQueue.Append (altem); 
myLock.Unlock(); 


LockedUnbounded: : Pop() 


d 


myLock.Lock(); 
T* res = nullptr; 
if (myQueue.IsEmpty()) 
res = myQueue.PopFirst(); 
myLock.Unlock(); 
return res; 


Ready queue - Unbounded Locked 


class LockedUnbounded: LockedUnbounded: : Push(T* altem) 
Mutex myLock ; í 
List<T> myQueue; myLock.Lock(); 
myQueue.Append (altem); 

myLock.Unlock(); 


} 


LockedUnbounded: : Pop() 


d 
Lock on push and pop myLock .Lock () ; DÁ 


T* res = nullpt 
if (myQueue.IsEmpty()) 


res = myQueue.PopFirst(); 
myLock.Unlock(); E. 


== — PP PP PPP EE EE EEE 
return res; E 


Ready queue 


O) UBISOFT 


Ready queue 


A mas e E 
ait ridge ANNA A O suður 
Ke e £ s R Sage a el card 


nn 
ar 


Armead 


k F 7 SP a EE. 
Togo en Pra on d 1 
ii a A IG N 


Ready queue 


Lock-free 


Ready queue 


Lock-based queue of lock-free queues 


Lock-free 


Lock-protected 


Ready queue 


Lock-based queue of lock-free queues 


Single 
producer 
O 


Lock-free 
AB A A AAA O AAN) (o) (0) (O} IO 
E 


Lock-protected 


O) UBISOFT 


Ready queue 


Lock-based queue of lock-free queues 


Single 
producer 
O 


Lock-free 


oloo) OOIOIO 


VAV 


OO000"10 


Lock-protected 


Multiple 
consumers 


Ready queue 


Lock-based queue of lock-free queues 


Lock is taken once per 
sub-queue size 


Single 
producer 
O 


Lock-free 


olol) OOIOIO 


VAV 


OO000"10 


Lock-protected 


Multiple 
consumers 


Ready queue 


Lock-based queue of lock-free queues 


Lock is taken once per Consumers need an 


À SCH Single 
sub-queue size explicit state 


producer 
O 


Lock-free 


olol) OOIOIO 


VAV 


(O}O}{O}(O} MO, 


Lock-protected 


Multiple 
consumers 


Ready queue example 


O) UBISOFT 


Ready queue example 


O) UBISOFT 


Ready queue example 


O) UBISOFT 


Ready queue example 


BWA 


©) UBISOFT 


Ready queue example 


O) UBISOFT 


Ready queue example 


O) UBISOFT 


Ready queue example 


O) UBISOFT 


Ready queue example 


TOND 
BWA 


©) UBISOFT 


Ready queue example 


TOn 
BWA 


© UBISOFT 


Ready queue example 


eJlleJleJleja |9)(9)(9)( | 


B A 


O) UBISOFT 


Ready queue example 


0000 SEEN 


«E = 


O) UBISOFT 


Ready queue example 


gogogo STA 


= 


© UBISOFT 


Ready queue example 


00/06/60 JO/OIOIG 
B A 


©) UBISOFT 


Ready queue example 


oJlleJleJleja |8)(9)(9)( __ 
B A 


O) UBISOFT 


Ready queue example 


A A 


O) UBISOFT 


Ready queue example 


0000 SEEN 


E. Li 


O) UBISOFT 


Ready queue example 


0000 EEEN 


E 


O) UBISOFT 


O) UBISOFT 


Ready queue example 


ELEC 


PB 


Ready queue example 


00100 10008 
À £ 


O) UBISOFT 


Ready queue example 


O) UBISOFT 


Our progress 


@ Task scheduling 
© Typical solutions 
© New task scheduler 
TaskScheduler parts Gär" O Scheduling gears 

Verification 


Benchmarks 


Future plans 


Our progress 


@ Task scheduling 
Ó Typical solutions 
Ó New task scheduler 
| Scheduling gears 
Coroutines Q Verification 

Benchmarks 


Future plans 


O) UBISOFT 


Coroutines 


Start a 
download 


Handle the 
© 


Coroutines 


Need to step away to 
let other tasks work 


AR Handle the © 
download result 


Coroutines 


Need some timeout 


for the waiting 
AR Handle the © 
download result 


N_/ 


Need to step away to 
let other tasks work 


Coroutines 


Need some timeout 
for the waiting 


ET 


Need to step away to 
let other tasks work 


Need to wakeup when 
get a response 


Coroutines 


Need some timeout 
for the waiting 


ET 


Need to step away to 
let other tasks work 


download 


Can yield 


Can set a 


deadline Need to wakeup when 


get a response 


Can be woken 
up explicitly 


O) UBISOFT 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync(url, { 

sched.Wakeup(t); 
HG 


sched.PostDeadline(t, now + 5 sec); 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download (t): 
Prepare the next —> t->SetCallback(HandleResult) ; 


step http->GetAsync (url, { 
sched.Wakeup(t); 
}); 


sched.PostDeadline(t, now + 5 sec); 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download (t) : Send an async 
t->SetCallback(HandleResult) ; 


http->GetAsync(url, { I< request, 
sched.Wakeup(t) ; wakeu on 

ESSE PO 

sched.PostDeadline(t, now + 5 sec); completion 
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TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync(url, { 

sched.Wakeup(t); 
i i HG 
Yield until +5 — >> sched.PostDeadline(t, now + 5 sec); 
secs or wakeup 
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Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync(url, { 

sched.Wakeup(t) ; 
+); 
sched.PostDeadline(t, now + 5 sec); 

HandleResult(t): 

if (t->IsExpired()) { 
http->Cancel(); 
sched.PostWait(t); 
return; 

} 

if (http->IsSuccess()) 
HandleSuccess(); 

else 
HandleFailure(); 

delete t; 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync(url, { 

sched.Wakeup(t); 
HG 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 
if (t->IsExpired()) { Check ifthe 


http->Cancel(); : : 

sched.PostWait(t); deadline IS up. 
, return; Cancel then 
if (http->IsSuccess()) 

HandleSuccess(); 
else 


HandleFailure(); 
delete t; 


Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync(url, { 

sched.Wakeup(t); 
HG 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 
if (t->IsExpired()) ( 
http->Cancel(); 
sched.PostWait(t); 


Not expired = return; 
} 
completed. =— 3: 1f (http->IsSuccess()) 
Handle it HandleSuccess(); 


else 
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Coroutines 


TaskScheduler sched; 
HTTPClient http; 


MyTask *t = new MyTask(); 
t->SetCallback (Download); 
sched.Post (t); 


Download(t): 
t->SetCallback(HandleResult) ; 
http->GetAsync (url, { 

sched.Wakeup(t); 
+); 
sched.PostDeadline(t, now + 5 sec); 

HandleResult(t): 

if (t->IsExpired()) (í 
http->Cancel(); 
sched.PostWait(t); 


return; 

} 

if (http->IsSuccess()) Completely lock- 
HandleSuccess(); 

else free, very low 


O) UBISOFT HandleFailure(); overhead 


delete t; 


How to verify a 
multithreaded 
algorithm? 


TLA+ Verification 


Temporal Logic of Actions 


Math logic with "time" 
concept 


TLA+ Verification 


Temporal Logic of Actions 


Math logic with "time" 
Language Runtime 
concept 
Fullscan and _ Fullscan and checking | 


CONSTANT Count 
CONSTANT Lim 
VARIABLES Pipe, 
LastReceived, 
LastSent 


Decide on 
granularity of 
the system: 
objects, actions 
on them 


O) UBISOFT 


TLA+ Example 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
EE /\ LastSent = 0 Actions consist of 
LastSent 


conditions. First 
is usually "init" 


CONSTANT Count 

CONSTANT Lim 

VARIABLES Pipe, 
LastReceived, 
LastSent 


TLA+ Example 


Init == 
/N Pipe = << >> 
/\ LastReceived = 0 


/\ LastSent = 0 Actions consist of 
conditions. First 


Examples of | na 
is usually "init" 


expressions: 


X and Y are true: XAY 


List of items x, y, 2: 


<<x, Y, Z>> (x, y, 2) 


X = Yy 


All items in set Y are equal 10: 
VA x Vin Y: x = 10 
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LastReceived = 0 
LastSent = 0 


Len(Pipe) < Lim 
LastSent < Count 
Pipe' = Append(Pipe, 
LastSent' = LastSent 


LastSent + 1) 
+1 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 
iti /\ Pipe' = Append(Pipe, LastSent + 1) 
Conditions for /N LastSent' = LastSent + 1 
the action to be 


possible 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 

/N LastSent < Count 

Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 


Conditions which 
"change" the 
state if the action 
is possible 
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TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 


/N Pip = end(Pipe, LastSent + 1) 
/\ L “K LastSent + 1 


Single quote _'_ 
Next value of X equals X + 1: 
refers to the next , _ 4 4 
value of the 
variable 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 

/N LastSent < Count 

/N Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 


Recv == 
/N Len(Pipe) > 0 
/N LastReceived' = Head(Pipe) 
/N Pipe' = Tail(Pipe) 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 


/N Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 
Recv == 
/N Len(Pipe) > 0 
/N LastReceived' = Head(Pipe) 
/N Pipe' = Tail(Pipe) 
PipeInvariant == 
IN MA à Nin 1..Len(Pipe) - 1: Pipe[i] + 1 = Pipe[i + 1] 


/N Len(Pipe) =< Lim 
/N N/ Len(Pipe) = 0 
\/ Pipe[1] = LastReceived + 1 


TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 


/N Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 
Recv == 
/N Len(Pipe) > 0 
/N LastReceived' = Head(Pipe) 
Items are /N Pipe' = Tail(Pipe) 
ordered 
PipeInvariant == 
IN MA à Nin 1..Len(Pipe) - 1: Pipe[i] + 1 = Pipe[i + 1] 


/\ Len(Pipe) =< Lim 
/\ \/ Len(Pipe) = 0 
\/ Pipe[1] = LastReceived + 1 
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TLA+ Example 


CONSTANT Count Init == 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 


/N Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 
Recv == 
/N Len(Pipe) > 0 
/N LastReceived' = Head(Pipe) 
/N Pipe' = Tail(Pipe) 
PipeInvariant == 
IN MA à Nin 1..Len(Pipe) - 1: Pipe[i] + 1 = Pipe[i + 1] 
The queue never —/\ Len(Pipe) =< Lim 
Len(Pipe) = 0 
overflows \/ Pipe[1] = LastReceived + 1 
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TLA+ Example 


CONSTANT Count Init = 
CONSTANT Lim /N Pipe = << >> 
VARIABLES Pipe, /N LastReceived = 0 
LastReceived, /N LastSent = 0 
LastSent 
Send == 


/N Len(Pipe) < Lim 
/N LastSent < Count 


/N Pipe' = Append(Pipe, LastSent + 1) 
/N LastSent' = LastSent + 1 
Recv == 

/N Len(Pipe) > 0 

/N LastReceived' = Head(Pipe) 

/N Pipe' = Tail(Pipe) 
The first item is Pipelnvariant == ` ` 

IN MA à Nin 1..Len(Pipe) - 1: Pipe[i] + 1 = Pipe[i + 1] 
always the next /N Len(Pipe) =< Lim 


/\ N/ Len(Pipe) = 0 


to receive (or the \/ Pipe[1] = LastReceived + 1 


queue is empty) 


O) UBISOFT 


TaskScheduler TLA+ 


MCSP queue spec: -430 lines 
/tla/MCSPQueue.tla 


TaskScheduler spec: ~750 lines 
/tla/TaskScheduler.tla 


How to run it: 
/tla/README.md 


Study TLA+, great course from its author: 


lamport.azurewebsites.net/tla/tla. html 
(O) veisorr 
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e 5 push-threads 
e ~9 min/sec 
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Comparative - algorithm vs its naive trivial version 


Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


e 5 push-threads 
e -9 min/sec 
x1.5 faster vs trivial 


e 10 push-threads 
e ~5.8 min/sec 
x2.6 faster vs trivial 


Benchmarks - parts 


Comparative - algorithm vs its naive trivial version 
Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


Ready Queue 


5 push-threads 
-9 min/sec 


x1.5 faster vs trivial SBN 7D 
=p ) => ( >) 
e 10 push-threads <> > ) 


~5.8 min/sec 


5 pop-threads 
~2.5 min/sec 
x2.6 faster vs trivial 

x0.0009 lock-contention 


x2.6 faster vs trivial 


Benchmarks - parts 


Comparative - algorithm vs its naive trivial version 
Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


Ready Queue 


5 push-threads 
-9 min/sec 


x1.5 faster vs trivial DANNE LSD 
=P | D =o ) 
10 push-threads <> y m aÀ 


~5.8 min/sec 


5 pop-threads 
e -2.5 min/sec 
e x2.6 faster vs trivial 

x0.0009 lock-contention 


10 pop-threads 
-1.7 min tasks/sec 
x4.5 faster vs trivial 
x0.0007 lock-contention 


x2.6 faster vs trivial 


Benchmarks - scheduler 
Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


Benchmarks - scheduler 
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1 worker 

-11 min/sec 

x2.2 faster vs trivial 
x0 lock-contention 


Benchmarks - scheduler 


Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


1 worker 

-11 min/sec 

x2.2 faster vs trivial 
x0 lock-contention 


5 workers 

~4 min/sec 

x3 faster vs trivial 
x0.002 lock-contention 


Benchmarks - scheduler 


Example: Debian Linux, 8 cores, 2.3GHz, hyperthreading 


1 worker 
-11 min/sec 
x2.2 faster vs trivial 


x0 lock-contention 


5 workers 

~4 min/sec 

x3 faster vs trivial 
x0.002 lock-contention 


10 workers 

-5.2 min/sec 

X7.5 faster vs trivial 
x0.003 lock-contention 


Real usage 


Savegame blobs multistep processing 


Real usage 


Savegame blobs multistep processing 


Debian Linux, 8 cores, 2.3GHz, hyperthreading 


"Updater": "TaskScheduler": 


e 4 workers => e 4 workers 
e -100-300 RPS e >10000 RPS 


e -500 ms latency X10 speed e -100 ms latency 


up right away 


Real usage 


Savegame blobs multistep processing 


Debian Linux, 8 cores, 2.3GHz, hyperthreading 


"Updater": "TaskScheduler": 


e 4 workers => e 4 workers 
e -100-300 RPS e >10000 RPS 


e -500 ms latency X10 speed e -100 ms latency 


up right away 
The algorithm is extendible 


oS) This is a thread-safe 
box. Can do here 


=$ ) anything, not just 


D) deadlines. Like add epoll a 


To MN 
) 


NA 
O) UBISOFT or IOCP 


Future plans 


Try on ARM 
Other languages 


Optimizations 


TLA+ specs and C++ code: 


github.com/ubisoft/ 
task-scheduler 


My talks (and this one too): 


slides.com/gerold103/ 
taskscheduler-highload2022-eng 
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How do the 
workers sleep? 


Smart usage of 
cmpxchg() 


Coroutine 
Wakeup vs Signal 


Additional content 


Signal 


Threads shouldn't poll 


Signal 


An event storage 


Threads shouldn't poll 


Signal 


Threads shouldn't poll 
An event storage 


Signal sig; 
bool hasEvent = false; 


Thread 1: Thread 2: 
hasEvent = _ — sig.BlockingReceive() 
sig.Send(); assert(hasEvent); 
// Won't receive again: 
assert(sig.IsEmpty()); 
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Signal 


An event storage 


Usual implementation 


class Signal: 
Mutex myLock; 
ConditionVariable myCond; 
bool myFlag; 


Threads shouldn't poll 


Signal 


Threads shouldn't poll 
An event storage 


Usual implementation 


class Signal: 
Mutex myLock; 
ConditionVariable myCond; 
bool myFlag; 


Signal: :Send() Signal: :BlockingReceive() 
d d 
myLock.Lock(); myLock.Lock(); 
myFlag = true; while (not myFlag) 
myCond.Signal(); myCond.Wait(); 
myLock.Unlock(); myFlag = false; 
H myLock.Unlock(); 
} 
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Signal 


Threads shouldn't poll 
An event storage 


Usual implementation 


class Signal: 
Mutex myLock; 
ConditionVariable myCond; 
bool myFlag; 


Signal::Send() Signal::BlockingReceive() 
d Expensive 1 
myLock . Lock () ; E mutex lock myLock.Lock () L 
myFlag = true; while (not myFlag) 
myCond.Signal(); on each myCond.Wait(); 
myLock.Unlock(); operation myFlag = false; 


} Ro myLock.Unlock(); 4 
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Signal 


Threads shouldn't poll 
An event storage 


Lock-free receipt if 
already signaled 


class Signal: 
Mutex myLock; 
ConditionVariable myCond; 
bool myFlag; 


Signal: :Send() Signal: :BlockingReceive() 
d d 
myLock.Lock (); if (AtomicExchange (myFlag, false)) 
AtomicExchange (myFlag, true); return; 
myCond.Signal(); myLock.Lock(); 
myLock.Unlock(); while (not AtomicExchange (myFlag, false)) 
} myCond.Wait(); 


myLock.Unlock(); 
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Signal 


An event storage 


Threads shouldn't poll 


Lock-free receipt if 
already signaled 


Lock-free send if 


k san. already signaled 
Mutex myLock; 
ConditionVariable myCond; 


bool myFlag; 


Signal::BlockingReceive( ) 


Signal::Send() 
í í 


if (AtomicExchange (myFlag, true)) if (AtomicExchange(myFlag, false)) 
return; return; 


myLock.Lock(); 


myLock.Lock(); 
while (not AtomicExchange(myFlag, false)) 


myCond.Signal(); 


myLock.Unlock(); myCond.Wait(); 


myLock.Unlock(); 
} 


O) UBISOFT 


Smart usage of cmpxchg 


AtomicCompareExchange (var, new value, check) 


d 
if (old value == check) 
return false; 
var = new value; 
return true; 
} 


Smart usage of cmpxchg 


AtomicCompareExchangeGetOld (var, new value, check) 


d 
if (old value == check) 
var = new value; 

} 
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Smart usage of cmpxchg 


AtomicCompareExchangeGetOld (var, new value, check) 


d 
if (old value == check) 
return 
var = new value; 
SEH 
} 
AtomicCompareExchange (var, new_value, check) 
{ 
return AtomicCompareExchangeGetOld ( 
val, new_value, check) == check; 
} 
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Smart usage of cmpxchg 


class MPSCQueue: MPSCQueue: :Push(T* altem) 
T* myTop; { 
T* oldTop; 
do { 


oldTop = AtomicLoad(myTop); 
altem->myNext = oldTop; 

} while (not AtomicCompareExchange ( 
myTop, altem, oldTop)); 


MPSCQueue: :PopAll(T* altem) 

{ 
T* top = AtomicExchange (myTop, nullptr); 
return ReverseList(top); 


Smart usage of cmpxchg 


class MPSCQueue: MPSCQueue: :Push(T* altem) 


T* myTop; { 
T* oldTop; 
do { 
oldTop = AtomicLoad(myTop); 
altem->myNext = oldTop; 
} while (not AtomicCompareExchange ( 
myTop, altem, oldTop)); 
} 


MPSCQueue: :PopAll(T* altem) 
{ 


T* top = AtomicExchange (myTop, nullptr); 
return ReverseList(top); 


Smart usage of cmpxchg 


class MPSCQueue: MPSCQueue: :Push(T* altem) 
T* myTop; { 
T* oldTop; 
Load the top —A T* res = AtomicLoad(myTop) ; 
once aoi 


oldTop = res; 
aItem->myNext = oldTop; 
res = AtomicCompareExchangeGetOld(myTop, altem, oldTop); 


Atomically retry 
setting a new top and 
getting the old one 


}| while (res != oldTop); 


MPSCQueue: :PopAll(T* altem) 


{ 
T* top = AtomicExchange (myTop, nullptr); 


Back return ReverseList(top); 
} 


Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); 
http->GetAsync (url, 
í 
http->SetReady(); 
sched.Wakeup(t); 
}); 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 

if (http->IsReady()) 

í 
Process (http->GetResult()); 
delete t; 
return; 

} 

http->Cancel(); 

sched.PostWait(t); 
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Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); 
http->GetAsync (url, 


í 
http->SetReady(); 
sched.Wakeup(t); 
}); 
sched.PostDeadline(t, now + 5 sec); Check the 
completion 
HandleResult(t): 
if (http->IsReady()) before the 
í expiration 


Process (http->GetResult()); 
delete t; 
return; 


http->Cancel(); 
sched.PostWait(t); 


O) UBISOFT 


Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download(t): The code will 
t->SetCallback(HandleResult) ; eventually crash 
http->GetAsync (url, 
{ here 


http->SetReady(); 
sched.Wakeup(t); 
+); 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 

if (http->IsReady()) 

í 
Process (http->GetResult()); 
delete t; 
return; 

} 

http->Cancel(); 

sched.PostWait(t); 


Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); HTTP threads set 
ready' flag 


http->GetAsync (url, 


http->SetReady(); 
sched.Wakeup(t); 


Thread A 


oo o. 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 

if (http->IsReady()) 

í 
Process (http->GetResult()); 
delete t; 
return; 

} 

http->Cancel(); 

sched.PostWait(t); 


Task signal 


TaskScheduler sched; 
HTTPClient http; 
Scheduler thread 
Download (t): 
t->SetCallback (HandleResult); wakes Up by 


http->GetAsync (url, timeout and 
deletes the task 


http->SetReady(); 
sched.Wakeup(t); 


Thread A 


Ooo 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 
if (http->IsReady()) 
í 


Process (http->GetResult()); 
Thread B delete t; 
return; 
} 
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http->Cancel(); 
sched.PostWait(t); 


Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); 
http->GetAsync (url, 


http->SetReady (); 
Thread A sched.Wakeup(t); 
sched.PostDeadline(t, now + 5 sec); 
HandleResult(t): 
if (http->IsReady () ) 
{ 
Process (http->GetResult()); 
Thread B delete t; 


return; 
} 
http->Cancel(); 
sched.PostWait(t); 
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HTTP thread uses a 
deleted task 


Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); 
http->GetAsync (url, 
í 
sched.Signal(t); 
}); 


sched.PostDeadline(t, now + 5 sec); 


HandleResult(t): 

if (t->ReceiveSignal()) 

í 
Process (http->GetResult()); 
delete t; 
return; 

} 

http->Cancel(); 

sched.PostWait(t); 
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Task signal 


TaskScheduler sched; 
HTTPClient http; 


Download (t): 
t->SetCallback (HandleResult); 
http->GetAsync (url, 


í 
sched.Signal(t); 
Signal Is atomic dE Port beddline ct: now + 5 sec); 


"wakeup + set flag" 


HandleResult(t): 

if (t->ReceiveSignal 

{ 
Process(http->GetResult()); 
delete t; 
return; 

} 

http->Cancel(); 

sched.PostWait(t); 
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